from pyspark.sql.types import StructType,StructField,StringType

class SchemaLoader:
    """Hold the Spark schemas for the movie and rating data.

    Both schemas are exposed as class attributes, and every column in them
    is declared as a nullable string.
    """

    # Schema of the movie data; the tuple order is the column order.
    movieSchema = StructType([
        StructField(column, StringType(), nullable=True)
        for column in ("movieId", "title", "genres")
    ])

    # Schema of the rating data; the tuple order is the column order.
    ratingSchema = StructType([
        StructField(column, StringType(), nullable=True)
        for column in ("userId", "movieId", "rating", "timestamp")
    ])




